# coding: utf-8

import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from scipy.io import arff
from sklearn.preprocessing import MinMaxScaler
from sklearn.preprocessing import StandardScaler


# Console display settings: let pandas print up to 888 columns and use lines
# up to 1000 characters wide when a DataFrame is shown.
pd.set_option('display.max_columns', 888)
pd.set_option('display.width', 1000)

# Location of the EQ.arff file (under the AEEEM data folder). The path is
# absolute and machine-specific; the raw-string prefix keeps the backslashes
# literal.
file_name = r'C:\Users\LDK‘s PC\Desktop\大三上工程研究与实习\机器学习\data\arff\AEEEM\EQ.arff'

# loadarff yields a pair: the records and the accompanying metadata object.
data, meta = arff.loadarff(file_name)

# Wrap the loaded records in a DataFrame for further processing.
df = pd.DataFrame(data)

# --- Exploratory checks (kept disabled) ---
# print(df.head())
# print(df.info())
# Inspect the basic distribution statistics of the table
# print(df.describe())
# Show the duplicated rows
# print(df[df.duplicated()])
# Drop the duplicated rows
# df.drop_duplicates(inplace=True)
# print(df.info())





